Personal Computer World 2008 February

home *** CD-ROM | disk | FTP | other *** search

/ Personal Computer World 2008 February / PCWFEB08.iso / Software / Freeware / Miro 1.0 / Miro_Installer.exe / Miro_Downloader.exe / subscription.pyc (.txt) < prev next >

Wrap

Python Compiled Bytecode | 2007-11-12 | 5.1 KB | 187 lines

# Source Generated with Decompyle++ # File: in.pyc (Python 2.5) import cgi import re import util import urllib2 import urlparse import xml.dom.minidom as xml reflexiveAutoDiscoveryOpener = urllib2.urlopen def parseFile(path): try: subscriptionFile = open(path, 'r') content = subscriptionFile.read() subscriptionFile.close() return parseContent(content) except: pass def parseContent(content): try: dom = xml.dom.minidom.parseString(content) root = dom.documentElement if root.nodeName == 'rss': urls = _getSubscriptionsFromRSSChannel(root) elif root.nodeName == 'feed': urls = _getSubscriptionsFromAtomFeed(root) elif root.nodeName == 'opml': urls = _getSubscriptionsFromOPMLOutline(root) else: urls = None dom.unlink() return urls except: import traceback if util.chatter: print 'WARNING: Error parsing OPML content...' traceback.print_exc() return None def get_urls_from_query(query): urls = [] for key, value in cgi.parse_qs(query).items(): if re.match('url\\d+$', key): urls.append(value[0]) continue return urls def findSubscribeLinks(url): """Given a URL, test if it's trying to subscribe the user using subscribe.getdemocracy.com. Returns the list of parsed URLs. """ try: (scheme, host, path, params, query, frag) = urlparse.urlparse(url) except: return ('none', []) if host not in ('subscribe.getdemocracy.com', 'subscribe.getmiro.com'): return ('none', []) if path in ('/', '/opml.php'): return ('feed', get_urls_from_query(query)) elif path in ('/download.php', '/download', '/download/'): return ('download', get_urls_from_query(query)) elif path in ('/channelguide.php', '/channelguide', '/channelguide/'): return ('guide', get_urls_from_query(query)) else: return ('feed', [ urllib2.unquote(path[1:])]) def _getSubscriptionsFromRSSChannel(root): try: channel = root.getElementsByTagName('channel').pop() urls = _getSubscriptionsFromAtomLinkConstruct(channel) if urls is not None: return urls else: link = channel.getElementsByTagName('link').pop() href = link.firstChild.data return _getSubscriptionsFromReflexiveAutoDiscovery(href, 'application/rss+xml') except: pass def _getSubscriptionsFromAtomFeed(root): try: urls = _getSubscriptionsFromAtomLinkConstruct(root) if urls is not None: return urls else: link = _getAtomLink(root) rel = link.getAttribute('rel') if rel == 'alternate': href = link.getAttribute('href') return _getSubscriptionsFromReflexiveAutoDiscovery(href, 'application/atom+xml') except: pass def _getSubscriptionsFromAtomLinkConstruct(node): try: link = _getAtomLink(node) if link.getAttribute('rel') in ('self', 'start'): href = link.getAttribute('href') return [ href] except: pass def _getSubscriptionsFromReflexiveAutoDiscovery(url, ltype): try: urls = list() html = reflexiveAutoDiscoveryOpener(url).read() for match in re.findall('<link[^>]+>', html): altMatch = re.search('rel="alternate"', match) typeMatch = re.search('type="%s"' % re.escape(ltype), match) hrefMatch = re.search('href="([^"]*)"', match) if None not in (altMatch, typeMatch, hrefMatch): href = hrefMatch.group(1) urls.append(href) continue except: urls = None if len(urls) == 0: urls = None return urls def _getAtomLink(node): return node.getElementsByTagNameNS('http://www.w3.org/2005/Atom', 'link').pop() def _getSubscriptionsFromOPMLOutline(root): try: urls = list() body = root.getElementsByTagName('body').pop() _searchOPMLNodeRecursively(body, urls) except: urls = None if len(urls) == 0: urls = None return urls def _searchOPMLNodeRecursively(node, urls): try: children = node.childNodes for child in children: if hasattr(child, 'getAttribute'): if child.hasAttribute('xmlUrl'): url = child.getAttribute('xmlUrl') urls.append(url) else: _searchOPMLNodeRecursively(child, urls) child.hasAttribute('xmlUrl') except: pass